# Base entry for the multistep word-problem eval.
# `id` names the versioned entry defined further down in this file;
# `metrics` lists the single metric declared for it (accuracy).
multistep-word-problems:
  id: multistep-word-problems.dev.v0
  # Folded scalar (>-): the lines below join with single spaces and the
  # trailing newline is stripped, yielding one single-line string.
  description: >-
    Test the model's ability to solve complex,
    multistep math word problems
  metrics:
    - accuracy

# Versioned spec; this key matches the `id` of the base entry above.
multistep-word-problems.dev.v0:
  # `module.path:ClassName` reference; quoted so the embedded colon can
  # never be mistaken for a mapping separator.
  class: 'evals.elsuite.basic.match:Match'
  # NOTE(review): presumably forwarded to the class above as constructor
  # arguments — confirm against the consuming framework.
  args:
    # NOTE(review): relative path; looks like it is resolved against the
    # framework's data directory — confirm.
    samples_jsonl: 'multistep-word-problems/samples.jsonl'
